10 年之前 · 0465835da8
--- a/Gemfile
+++ b/Gemfile
@@ -81,6 +81,7 @@ gem 'string-scrub'	# for ruby <2.1
 
                 gem 'therubyracer', '~> 0.12.1'
              
 
                 gem 'typhoeus', '~> 0.6.3'
              
 
                 gem 'uglifier', '>= 1.3.0'
              
 
                +gem 'hypdf', '~> 1.0.7'
              
 
                 
              
 
                 group :development do
              
 
                   gem 'better_errors', '~> 1.1'
              
--- a/Gemfile.lock
+++ b/Gemfile.lock
@@ -174,12 +174,17 @@ GEM
 
                     hipchat (1.2.0)
              
 
                       httparty
              
 
                     hpricot (0.8.6)
              
 
                +    httmultiparty (0.3.10)
              
 
                +      httparty (>= 0.7.3)
              
 
                +      multipart-post
              
 
                     http (0.5.1)
              
 
                       http_parser.rb
              
 
                     http_parser.rb (0.6.0)
              
 
                     httparty (0.13.1)
              
 
                       json (~> 1.8)
              
 
                       multi_xml (>= 0.5.2)
              
 
                +    hypdf (1.0.7)
              
 
                +      httmultiparty (= 0.3.10)
              
 
                     i18n (0.6.11)
              
 
                     jquery-rails (3.1.1)
              
 
                       railties (>= 3.0, < 5.0)
              
@@ -475,6 +480,7 @@ DEPENDENCIES
 
                   guard-rspec
              
 
                   hipchat (~> 1.2.0)
              
 
                   httparty (~> 0.13)
              
 
                +  hypdf (~> 1.0.7)
              
 
                   jquery-rails (~> 3.1.0)
              
 
                   json (~> 1.8.1)
              
 
                   jsonpath (~> 0.5.6)
              
--- a/app/models/agents/pdf_info_agent.rb
+++ b/app/models/agents/pdf_info_agent.rb
@@ -0,0 +1,62 @@
 
                +require 'open-uri'
              
 
                +require 'hypdf'
              
 
                +
              
 
                +module Agents
              
 
                +  class PdfInfoAgent < Agent
              
 
                +
              
 
                +    gem_dependency_check { defined?(HyPDF) }
              
 
                +
              
 
                +    cannot_be_scheduled!
              
 
                +
              
 
                +    description <<-MD
              
 
                +      In order for this agent to work, you need to have [HyPDF](https://devcenter.heroku.com/articles/hypdf) running and configured.
              
 
                +
              
 
                +      It works by acting on events that contain a key `url` in their payload, and runs the [pdfinfo](https://devcenter.heroku.com/articles/hypdf#pdfinfo) command on them.
              
 
                +    MD
              
 
                +
              
 
                +    event_description <<-MD
              
 
                +    This will change based on the metadata in the pdf.
              
 
                +
              
 
                +      { "Title"=>"Everyday Rails Testing with RSpec", 
              
 
                +        "Author"=>"Aaron Sumner",
              
 
                +        "Creator"=>"LaTeX with hyperref package",
              
 
                +        "Producer"=>"xdvipdfmx (0.7.8)",
              
 
                +        "CreationDate"=>"Fri Aug  2 05",
              
 
                +        "32"=>"50 2013",
              
 
                +        "Tagged"=>"no",
              
 
                +        "Pages"=>"150",
              
 
                +        "Encrypted"=>"no",
              
 
                +        "Page size"=>"612 x 792 pts (letter)",
              
 
                +        "Optimized"=>"no",
              
 
                +        "PDF version"=>"1.5",
              
 
                +        "url": "your url"
              
 
                +      }
              
 
                +    MD
              
 
                +
              
 
                +    def working?
              
 
                +      !recent_error_logs?
              
 
                +    end
              
 
                +
              
 
                +    def default_options
              
 
                +      {}
              
 
                +    end
              
 
                +
              
 
                +    def receive(incoming_events)
              
 
                +      incoming_events.each do |event|
              
 
                +        interpolate_with(event) do
              
 
                +          url_to_scrape = event.payload['url']
              
 
                +          check_url(url_to_scrape, event.payload) if url_to_scrape =~ /^https?:\/\//i
              
 
                +        end
              
 
                +      end
              
 
                +    end
              
 
                +
              
 
                +    def check_url(in_url, payload)
              
 
                +      return unless in_url.present?
              
 
                +      Array(in_url).each do |url|
              
 
                +        log "Fetching #{url}"
              
 
                +        info = HyPDF.pdfinfo(open(url))
              
 
                +        create_event :payload => info.merge(payload)
              
 
                +      end
              
 
                +    end
              
 
                +  end
              
 
                +end